{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "3c671bff",
   "metadata": {},
   "outputs": [],
   "source": [
    "import jieba\n",
    "\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import matplotlib.ticker as ticker\n",
    "import pandas as pd\n",
    "\n",
    "plt.rcParams['font.sans-serif']=[u'SimHei']\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "c77828a1",
   "metadata": {},
   "outputs": [],
   "source": [
    "data=pd.read_csv(\"动漫评价数据集/anime_t.csv\",encoding=\"utf-8\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "a27278a3",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>user_id</th>\n",
       "      <th>subject_id</th>\n",
       "      <th>status</th>\n",
       "      <th>date</th>\n",
       "      <th>rate</th>\n",
       "      <th>tag</th>\n",
       "      <th>comment</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>173791</td>\n",
       "      <td>22588</td>\n",
       "      <td>do</td>\n",
       "      <td>2012-4-5</td>\n",
       "      <td>0</td>\n",
       "      <td></td>\n",
       "      <td>喜欢海赖先生~~~~~</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>173791</td>\n",
       "      <td>20582</td>\n",
       "      <td>do</td>\n",
       "      <td>2012-2-10</td>\n",
       "      <td>0</td>\n",
       "      <td></td>\n",
       "      <td>等待中。。。。着急</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>173791</td>\n",
       "      <td>24790</td>\n",
       "      <td>do</td>\n",
       "      <td>2012-2-10</td>\n",
       "      <td>0</td>\n",
       "      <td></td>\n",
       "      <td>快点出</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>173791</td>\n",
       "      <td>10440</td>\n",
       "      <td>do</td>\n",
       "      <td>2011-5-14</td>\n",
       "      <td>0</td>\n",
       "      <td></td>\n",
       "      <td>看着很纠结</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>173791</td>\n",
       "      <td>1671</td>\n",
       "      <td>do</td>\n",
       "      <td>2011-2-18</td>\n",
       "      <td>0</td>\n",
       "      <td></td>\n",
       "      <td>看了1集，继续看</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9218398</th>\n",
       "      <td>227902</td>\n",
       "      <td>230914</td>\n",
       "      <td>collect</td>\n",
       "      <td>2021-2-2</td>\n",
       "      <td>9</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9218399</th>\n",
       "      <td>227902</td>\n",
       "      <td>285901</td>\n",
       "      <td>collect</td>\n",
       "      <td>2021-2-2</td>\n",
       "      <td>9</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9218400</th>\n",
       "      <td>227902</td>\n",
       "      <td>282433</td>\n",
       "      <td>collect</td>\n",
       "      <td>2021-2-2</td>\n",
       "      <td>9</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9218401</th>\n",
       "      <td>227902</td>\n",
       "      <td>246001</td>\n",
       "      <td>collect</td>\n",
       "      <td>2021-2-2</td>\n",
       "      <td>8</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9218402</th>\n",
       "      <td>227902</td>\n",
       "      <td>285666</td>\n",
       "      <td>collect</td>\n",
       "      <td>2021-2-2</td>\n",
       "      <td>9</td>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>9218403 rows × 7 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "         user_id  subject_id   status       date  rate tag       comment\n",
       "0         173791       22588       do   2012-4-5     0       喜欢海赖先生~~~~~\n",
       "1         173791       20582       do  2012-2-10     0         等待中。。。。着急\n",
       "2         173791       24790       do  2012-2-10     0               快点出\n",
       "3         173791       10440       do  2011-5-14     0             看着很纠结\n",
       "4         173791        1671       do  2011-2-18     0          看了1集，继续看\n",
       "...          ...         ...      ...        ...   ...  ..           ...\n",
       "9218398   227902      230914  collect   2021-2-2     9                  \n",
       "9218399   227902      285901  collect   2021-2-2     9                  \n",
       "9218400   227902      282433  collect   2021-2-2     9                  \n",
       "9218401   227902      246001  collect   2021-2-2     8                  \n",
       "9218402   227902      285666  collect   2021-2-2     9                  \n",
       "\n",
       "[9218403 rows x 7 columns]"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "dafd36be",
   "metadata": {},
   "outputs": [],
   "source": [
    "data[\"comment\"]"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
